#!/usr/bin/env python
# -*- coding:utf-8 -*-
import json

from bs4 import BeautifulSoup

from crawler.parse_util import parse_basesic

# Absolute location of the HTML file that test() reads and parses.
# NOTE(review): this is a machine-specific path — adjust it for your environment.
base_path = "/home/rocky/workfile/gongshang_html/liaoning.html"
import codecs
def test():
    """Parse the HTML file at ``base_path`` and print the result as JSON.

    The file is read as UTF-8, turned into a BeautifulSoup tree using the
    ``html5lib`` parser, and passed to ``parse_basesic.parse_basesic``.
    Whatever that call returns is serialized with ``json.dumps`` and
    printed to standard output.
    """
    # Context manager guarantees the file handle is closed, even if the
    # read raises (the original left the handle open).
    with codecs.open(base_path, encoding='utf-8') as html_file:
        html = html_file.read()
    soup = BeautifulSoup(html, 'html5lib')
    result = parse_basesic.parse_basesic(soup)
    # ensure_ascii=False emits non-ASCII characters as-is instead of \u escapes.
    # The parenthesized single-argument form prints identically under
    # Python 2 and is also valid Python 3 syntax.
    print(json.dumps(result, ensure_ascii=False))

# Run the parsing check only when this file is executed as a script,
# so importing the module does not trigger file I/O.
if __name__ == "__main__":
    test()
